{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 55,
   "id": "f8007a0b",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-06-24T10:30:52.081110Z",
     "start_time": "2023-06-24T10:30:48.051661Z"
    }
   },
   "outputs": [],
   "source": [
    "from requests_html import HTMLSession\n",
    "import json\n",
    "import pandas as pd\n",
    "\n",
    "\n",
    "url = \"https://api-c.liepin.com/api/com.liepin.searchfront4c.pc-search-job\"\n",
    "payload = {\n",
    "    \"data\":{\n",
    "        \"mainSearchPcConditionForm\": {\n",
    "            \"city\": \"050020\",\n",
    "            \"dq\": \"050020\",\n",
    "            \"pubTime\": \"\",\n",
    "            \"currentPage\": 1,\n",
    "            \"pageSize\": 40,\n",
    "            \"key\": \"前端开发\",\n",
    "            \"suggestTag\": \"\",\n",
    "            \"workYearCode\": \"0\",\n",
    "            \"compId\": \"\",\n",
    "            \"compName\": \"\",\n",
    "            \"compTag\": \"\",\n",
    "            \"industry\": \"\",\n",
    "            \"salary\": \"\",\n",
    "            \"jobKind\": \"\",\n",
    "            \"compScale\": \"\",\n",
    "            \"compKind\": \"\",\n",
    "            \"compStage\": \"\",\n",
    "            \"eduLevel\": \"\"\n",
    "        },\n",
    "        \"passThroughForm\": {\n",
    "            \"scene\": \"condition\",\n",
    "            \"skId\": \"mj3mjyy64uu45jg1qtn9pzprjvuhoyc8\",\n",
    "            \"fkId\": \"mj3mjyy64uu45jg1qtn9pzprjvuhoyc8\",\n",
    "            \"ckId\": \"ih4fd3x0qhs56f3x2u9ne0alw9j14kia\",\n",
    "            \"suggest\": None\n",
    "        }\n",
    "    }\n",
    "}\n",
    "\n",
    "\n",
    "\n",
    "# create an HTML session using Requests-HTML\n",
    "session = HTMLSession()\n",
    "\n",
    "# set the headers\n",
    "headers = {\n",
    "    'Accept': 'application/json, text/plain, */*',\n",
    "    'Accept-Encoding': 'gzip, deflate, br',\n",
    "    'Accept-Language': 'zh-CN,zh;q=0.9,zh-TW;q=0.8,en-US;q=0.7,en;q=0.6',\n",
    "    'Connection': 'keep-alive',\n",
    "    'Content-Length': '412',\n",
    "    'Content-Type': 'application/json;charset=UTF-8;',\n",
    "    'Cookie': '__gc_id=f500dd7cb42648e1a2714029f702540f; __uuid=1680246346233.95; _ga=GA1.1.1352270155.1682058969; need_bind_tel=false; c_flag=3b526044dc9ca4cc969fe64335a37d51; imClientId=dff6fc07f54a6bed9245bc83c25defde; imId=dff6fc07f54a6bedb656b942dce8623e; imClientId_0=dff6fc07f54a6bed9245bc83c25defde; imId_0=dff6fc07f54a6bedb656b942dce8623e; new_user=false; __tlog=1687345768976.39%7C00000000%7C00000000%7Cs_00_t00%7Cs_00_t00; XSRF-TOKEN=GHNWHeAGTH2jWhn0r832rg; UniqueKey=44c0232e8b551e826bc56763ae71c6f2; liepin_login_valid=0; lt_auth=s7wNMyEHmlSs7XnY2DZb7a1LiN6sWW3O%2FH4Ngh9V1YC6CvKw4P%2FmQA%2BFq7MG%2BCoIqxknJa4zMLb2Muv6zHtL6kMW%2FFGnlZ6utf6k1X4eTu1nHuyflMXuqsjQQJgirXo6ykpgn2si0HU%3D; inited_user=5992e0c0c9715067fd467126be5f93ce; user_roles=0; user_photo=5f8fa3baf6d1ab58476f324908u.png; user_name=%E5%91%A8%E6%BA%90; Hm_lvt_a2647413544f5a04f00da7eee0d5e200=1685965243,1687345811; acw_tc=276077bb16873458115691907e2882a35ef69d6d066b467094499a47c71496; imApp_0=1; __session_seq=3; __uv_seq=3; Hm_lpvt_a2647413544f5a04f00da7eee0d5e200=1687345822; fe_im_socketSequence_new_0=2_2_2; fe_im_opened_pages=; fe_im_connectJson_0=%7B%220_44c0232e8b551e826bc56763ae71c6f2%22%3A%7B%22socketConnect%22%3A%222%22%2C%22connectDomain%22%3A%22liepin.com%22%7D%7D; _ga_54YTJKWN86=GS1.1.1687345821.3.1.1687345849.0.0.0',\n",
    "    'Host': 'api-c.liepin.com',\n",
    "    'Origin': 'https://www.liepin.com',\n",
    "    'Referer': 'https://www.liepin.com/',\n",
    "    'sec-ch-ua': '\"\"Not.A/Brand\";v=\"8\", \"Chromium\";v=\"114\", \"Google Chrome\";v=\"114\"\"',\n",
    "    'sec-ch-ua-mobile': '?0',\n",
    "    'sec-ch-ua-platform': '\"Windows\"',\n",
    "    'Sec-Fetch-Dest': 'empty',\n",
    "    'Sec-Fetch-Mode': 'cors',\n",
    "    'Sec-Fetch-Site': 'same-site',\n",
    "    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36',\n",
    "    'X-Client-Type': 'web',\n",
    "    'X-Fscp-Bi-Stat': '{\"location\": \"https://www.liepin.com/zhaopin/?inputFrom=c_index&workYearCode=1&key=%E5%89%8D%E7%AB%AF%E5%BC%80%E5%8F%91&scene=input&ckId=yc643cafb4izh5tvgqvjxu9fdtxhg5q9&\"}',\n",
    "    'X-Fscp-Fe-Version': '',\n",
    "    'X-Fscp-Std-Info': '{\"client_id\": \"40108\"}',\n",
    "    'X-Fscp-Trace-Id': '9c605930-a30e-48f0-b21b-d81be0de8519',\n",
    "    'X-Fscp-Version': '1.1',\n",
    "    'X-Requested-With': 'XMLHttpRequest',\n",
    "    'X-XSRF-TOKEN': 'GHNWHeAGTH2jWhn0r832rg'\n",
    "}\n",
    "\n",
    "# send a POST request with headers\n",
    "shuju = []\n",
    "for i in range(13):\n",
    "    payload['data']['mainSearchPcConditionForm']['currentPage'] = i\n",
    "    r = session.post(url, data=json.dumps(payload), headers=headers)\n",
    "    # extract the JSON data from the response\n",
    "    response_data = r.json()\n",
    "    shuju1 = pd.json_normalize(response_data['data']['data'])\n",
    "    shuju.append(shuju1)\n",
    "# example: print the number of job postings returned\n",
    "# print(response_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "id": "7aeca320",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-06-24T10:30:57.377629Z",
     "start_time": "2023-06-24T10:30:57.212040Z"
    }
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[                                         jobCardList compList\n",
       " 0  [{'dataParams': '{\"imId\":\"98edf36b7f36d00f4a7a...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'recruiter': {'recruiterName': '陈先生', 'recru...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'comp': {'compId': 8805672, 'compScale': '50...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'job': {'labels': ['前端开发', 'Vue', '界面开发', '框...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'job': {'labels': ['前端开发', '大数据领域', 'ECMAScr...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'dataParams': '{\"imId\":\"37e868f3e9f307ad59a7...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'dataInfo': '%7B%22sfrom%22%3A%22search_job_...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'job': {'labels': ['前端开发', '架构设计', '界面开发', '...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'dataInfo': '%7B%22jobId%22%3A%2232128779%22...       [],\n",
       "                                          jobCardList compList\n",
       " 0  [{'dataParams': '{\"jobKind\":\"2\",\"jobId\":\"20510...       [],\n",
       " Empty DataFrame\n",
       " Columns: []\n",
       " Index: [0],\n",
       " Empty DataFrame\n",
       " Columns: []\n",
       " Index: [0],\n",
       " Empty DataFrame\n",
       " Columns: []\n",
       " Index: [0]]"
      ]
     },
     "execution_count": 56,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "shuju"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "id": "ef5d9f70",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-06-24T10:31:01.358474Z",
     "start_time": "2023-06-24T10:31:01.337522Z"
    },
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['jobCardList', 'compList'], dtype='object')"
      ]
     },
     "execution_count": 57,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_shuju = pd.concat(shuju)\n",
    "new_shuju.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "753265fa",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-06-21T11:23:40.265437Z",
     "start_time": "2023-06-21T11:23:40.214610Z"
    }
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.refreshTime</th>\n",
       "      <th>job.jobId</th>\n",
       "      <th>job.jobKind</th>\n",
       "      <th>job.title</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>job.topJob</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>...</th>\n",
       "      <th>recruiter.recruiterPhoto</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>comp.compStage</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>job.requireEduLevel</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>%7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...</td>\n",
       "      <td>{\"imId\":\"30ab872ce6a2dc3613d8a6ef9551fb50\",\"im...</td>\n",
       "      <td>[学历不限, 前端开发]</td>\n",
       "      <td>20230113164340</td>\n",
       "      <td>51235411</td>\n",
       "      <td>6</td>\n",
       "      <td>Web前端开发工程师</td>\n",
       "      <td>12-16k·14薪</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f98648dbe6273dcf8515508u.jpg</td>\n",
       "      <td>9386110.0</td>\n",
       "      <td>62906f4fb244352e0e92648207u.png</td>\n",
       "      <td>多益网络有限公司</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>https://www.liepin.com/company/9386110/</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>%7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...</td>\n",
       "      <td>{\"imId\":\"8951c85dd8b85b3c062c1b1ee9c7454d\",\"im...</td>\n",
       "      <td>[本科, 前端开发, jQuery, 界面开发, Vue, ElementUI, Node....</td>\n",
       "      <td>20211214164804</td>\n",
       "      <td>42727089</td>\n",
       "      <td>6</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>7-12k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州</td>\n",
       "      <td>...</td>\n",
       "      <td>54d1e78d712eb4f6b84c788f02c.jpg</td>\n",
       "      <td>8086509.0</td>\n",
       "      <td>5bfe91b674719d35745ae24c03a.png</td>\n",
       "      <td>凯普生物</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>https://www.liepin.com/company/8086509/</td>\n",
       "      <td>制药</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>%7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...</td>\n",
       "      <td>{\"imId\":\"9ac77eac63b17fd2337193710fe42056\",\"im...</td>\n",
       "      <td>[本科, 前端开发, 框架开发, 框架设计, Bootstrap]</td>\n",
       "      <td>20220908120814</td>\n",
       "      <td>52128303</td>\n",
       "      <td>6</td>\n",
       "      <td>前端开发（校招）</td>\n",
       "      <td>8-12k·13薪</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>552933.0</td>\n",
       "      <td>5bfea2fc74719d2aa34c73fb03a.png</td>\n",
       "      <td>广东亿迅科技有限公司</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>https://www.liepin.com/company/552933/</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>%7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...</td>\n",
       "      <td>{\"imId\":\"b38e0b86dbeffdd7c62c94f01ec83e9b\",\"im...</td>\n",
       "      <td>[本科, 前端开发, 架构开发, 架构设计, Bootstrap, 模块开发]</td>\n",
       "      <td>20220913185838</td>\n",
       "      <td>52549581</td>\n",
       "      <td>6</td>\n",
       "      <td>前端开发工程师(J12153)</td>\n",
       "      <td>8-16k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9863f6d1ab58476f246a08u.jpg</td>\n",
       "      <td>8010374.0</td>\n",
       "      <td>58da3d3d7032bfe7c3ed63ea05a.jpg</td>\n",
       "      <td>高新兴科技集团股份有限公司</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>https://www.liepin.com/company/8010374/</td>\n",
       "      <td>IT服务</td>\n",
       "      <td>创业板上市</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>%7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...</td>\n",
       "      <td>{\"imId\":\"5f698e933b768c3fc0b855de83315f3c\",\"im...</td>\n",
       "      <td>[本科, 通信领域, 界面开发, 商业信息化, 后端开发, Vue, 系统开发, 框架设计,...</td>\n",
       "      <td>20230328111429</td>\n",
       "      <td>47628285</td>\n",
       "      <td>6</td>\n",
       "      <td>前端开发</td>\n",
       "      <td>10-25k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9865ea60860b75384fa508u.jpg</td>\n",
       "      <td>1552617.0</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>广州三川控制系统工程设备有限公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>https://www.liepin.com/company/1552617/</td>\n",
       "      <td>电气机械/器材</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"jobId\":\"57402437\",\"imId\":\"f27a...</td>\n",
       "      <td>[React]</td>\n",
       "      <td>20230510215528</td>\n",
       "      <td>57402437</td>\n",
       "      <td>2</td>\n",
       "      <td>资深前端开发工程师</td>\n",
       "      <td>20-26k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9866dfb13a7dee342f1808u.jpg</td>\n",
       "      <td>7956170.0</td>\n",
       "      <td>5bfe94be74719dc6ed73fb5a03a.png</td>\n",
       "      <td>佰钧成技术</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>https://www.liepin.com/company/7956170/</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"jobId\":\"51441947\",\"imId\":\"2996...</td>\n",
       "      <td>[前端开发, Javascript, CSS, HTML, React, Web开发]</td>\n",
       "      <td>20220727140759</td>\n",
       "      <td>51441947</td>\n",
       "      <td>2</td>\n",
       "      <td>中高级前端开发工程师</td>\n",
       "      <td>12-18k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>...</td>\n",
       "      <td>62da47dc83876966f0d58fcf08u.png</td>\n",
       "      <td>8634915.0</td>\n",
       "      <td>63944509821c6d513110d6e403u.png</td>\n",
       "      <td>佰聆数据股份有限公司</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>https://www.liepin.com/company/8634915/</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>NaN</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"jobId\":\"51567365\",\"imId\":\"12b5...</td>\n",
       "      <td>[Web开发, 前端开发, Javascript, Angular, nestjs]</td>\n",
       "      <td>20220802103324</td>\n",
       "      <td>51567365</td>\n",
       "      <td>2</td>\n",
       "      <td>WEB前端开发</td>\n",
       "      <td>5-10k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f9868f6d1ab58476f24a008u.jpg</td>\n",
       "      <td>12666301.0</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>裂变科技(广州)有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>https://www.liepin.com/company/12666301/</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>学历不限</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"jobId\":\"58984835\",\"imId\":\"5906...</td>\n",
       "      <td>[前端开发, jQuery, 界面开发, React, CSS, HTML, R语言]</td>\n",
       "      <td>20230608152044</td>\n",
       "      <td>58984835</td>\n",
       "      <td>2</td>\n",
       "      <td>前端开发工程师-五险一金13薪</td>\n",
       "      <td>16-23k·13薪</td>\n",
       "      <td>False</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>...</td>\n",
       "      <td>5f8f986c79c7cc70efbf36c808u.jpg</td>\n",
       "      <td>13521485.0</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>前海豆米</td>\n",
       "      <td></td>\n",
       "      <td>https://www.liepin.com/company/13521485/</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>%7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...</td>\n",
       "      <td>{\"jobKind\":\"2\",\"jobId\":\"57110857\",\"imId\":\"1315...</td>\n",
       "      <td>[界面开发, Node.js, React, 前端开发, Vue, MVVM, Angula...</td>\n",
       "      <td>20230320143422</td>\n",
       "      <td>57110857</td>\n",
       "      <td>2</td>\n",
       "      <td>Web前端开发工程师</td>\n",
       "      <td>8-12k</td>\n",
       "      <td>False</td>\n",
       "      <td>广州</td>\n",
       "      <td>...</td>\n",
       "      <td>54d1e787712eb4f6b84c67e301a.jpg</td>\n",
       "      <td>7892457.0</td>\n",
       "      <td>5bfea11474719d2aa34c16b103a.png</td>\n",
       "      <td>易幻网络</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>https://www.liepin.com/company/7892457/</td>\n",
       "      <td>游戏</td>\n",
       "      <td>战略投资</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>本科</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>520 rows × 32 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                             dataInfo  \\\n",
       "0   %7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...   \n",
       "1   %7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...   \n",
       "2   %7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...   \n",
       "3   %7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...   \n",
       "4   %7B%22pageSize%22%3A%2240%22%2C%22curPage%22%3...   \n",
       "..                                                ...   \n",
       "35  %7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...   \n",
       "36  %7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...   \n",
       "37  %7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...   \n",
       "38  %7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...   \n",
       "39  %7B%22jobKind%22%3A%222%22%2C%22jobId%22%3A%22...   \n",
       "\n",
       "                                           dataParams  \\\n",
       "0   {\"imId\":\"30ab872ce6a2dc3613d8a6ef9551fb50\",\"im...   \n",
       "1   {\"imId\":\"8951c85dd8b85b3c062c1b1ee9c7454d\",\"im...   \n",
       "2   {\"imId\":\"9ac77eac63b17fd2337193710fe42056\",\"im...   \n",
       "3   {\"imId\":\"b38e0b86dbeffdd7c62c94f01ec83e9b\",\"im...   \n",
       "4   {\"imId\":\"5f698e933b768c3fc0b855de83315f3c\",\"im...   \n",
       "..                                                ...   \n",
       "35  {\"jobKind\":\"2\",\"jobId\":\"57402437\",\"imId\":\"f27a...   \n",
       "36  {\"jobKind\":\"2\",\"jobId\":\"51441947\",\"imId\":\"2996...   \n",
       "37  {\"jobKind\":\"2\",\"jobId\":\"51567365\",\"imId\":\"12b5...   \n",
       "38  {\"jobKind\":\"2\",\"jobId\":\"58984835\",\"imId\":\"5906...   \n",
       "39  {\"jobKind\":\"2\",\"jobId\":\"57110857\",\"imId\":\"1315...   \n",
       "\n",
       "                                           job.labels job.refreshTime  \\\n",
       "0                                        [学历不限, 前端开发]  20230113164340   \n",
       "1   [本科, 前端开发, jQuery, 界面开发, Vue, ElementUI, Node....  20211214164804   \n",
       "2                   [本科, 前端开发, 框架开发, 框架设计, Bootstrap]  20220908120814   \n",
       "3             [本科, 前端开发, 架构开发, 架构设计, Bootstrap, 模块开发]  20220913185838   \n",
       "4   [本科, 通信领域, 界面开发, 商业信息化, 后端开发, Vue, 系统开发, 框架设计,...  20230328111429   \n",
       "..                                                ...             ...   \n",
       "35                                            [React]  20230510215528   \n",
       "36        [前端开发, Javascript, CSS, HTML, React, Web开发]  20220727140759   \n",
       "37         [Web开发, 前端开发, Javascript, Angular, nestjs]  20220802103324   \n",
       "38        [前端开发, jQuery, 界面开发, React, CSS, HTML, R语言]  20230608152044   \n",
       "39  [界面开发, Node.js, React, 前端开发, Vue, MVVM, Angula...  20230320143422   \n",
       "\n",
       "   job.jobId job.jobKind        job.title  job.salary  job.topJob  job.dq  \\\n",
       "0   51235411           6       Web前端开发工程师  12-16k·14薪       False  广州-黄埔区   \n",
       "1   42727089           6          前端开发工程师       7-12k       False      广州   \n",
       "2   52128303           6         前端开发（校招）   8-12k·13薪       False  广州-天河区   \n",
       "3   52549581           6  前端开发工程师(J12153)       8-16k       False  广州-黄埔区   \n",
       "4   47628285           6             前端开发      10-25k       False  广州-黄埔区   \n",
       "..       ...         ...              ...         ...         ...     ...   \n",
       "35  57402437           2        资深前端开发工程师      20-26k       False      广州   \n",
       "36  51441947           2       中高级前端开发工程师      12-18k       False  广州-黄埔区   \n",
       "37  51567365           2          WEB前端开发       5-10k       False  广州-番禺区   \n",
       "38  58984835           2  前端开发工程师-五险一金13薪  16-23k·13薪       False  广州-黄埔区   \n",
       "39  57110857           2       Web前端开发工程师       8-12k       False      广州   \n",
       "\n",
       "    ...         recruiter.recruiterPhoto  comp.compId  \\\n",
       "0   ...  5f8f98648dbe6273dcf8515508u.jpg    9386110.0   \n",
       "1   ...  54d1e78d712eb4f6b84c788f02c.jpg    8086509.0   \n",
       "2   ...  5f8f9866dfb13a7dee342f1808u.jpg     552933.0   \n",
       "3   ...  5f8f9863f6d1ab58476f246a08u.jpg    8010374.0   \n",
       "4   ...  5f8f9865ea60860b75384fa508u.jpg    1552617.0   \n",
       "..  ...                              ...          ...   \n",
       "35  ...  5f8f9866dfb13a7dee342f1808u.jpg    7956170.0   \n",
       "36  ...  62da47dc83876966f0d58fcf08u.png    8634915.0   \n",
       "37  ...  5f8f9868f6d1ab58476f24a008u.jpg   12666301.0   \n",
       "38  ...  5f8f986c79c7cc70efbf36c808u.jpg   13521485.0   \n",
       "39  ...  54d1e787712eb4f6b84c67e301a.jpg    7892457.0   \n",
       "\n",
       "                      comp.compLogo     comp.compName comp.compScale  \\\n",
       "0   62906f4fb244352e0e92648207u.png          多益网络有限公司     2000-5000人   \n",
       "1   5bfe91b674719d35745ae24c03a.png              凯普生物     2000-5000人   \n",
       "2   5bfea2fc74719d2aa34c73fb03a.png        广东亿迅科技有限公司     2000-5000人   \n",
       "3   58da3d3d7032bfe7c3ed63ea05a.jpg     高新兴科技集团股份有限公司     2000-5000人   \n",
       "4   61b07937d0458d53c627567e02u.jpg  广州三川控制系统工程设备有限公司         50-99人   \n",
       "..                              ...               ...            ...   \n",
       "35  5bfe94be74719dc6ed73fb5a03a.png             佰钧成技术       10000人以上   \n",
       "36  63944509821c6d513110d6e403u.png        佰聆数据股份有限公司       500-999人   \n",
       "37  61b07937d0458d53c627567e02u.jpg      裂变科技(广州)有限公司          1-49人   \n",
       "38  61b07937d0458d53c627567e02u.jpg              前海豆米                  \n",
       "39  5bfea11474719d2aa34c16b103a.png              易幻网络       500-999人   \n",
       "\n",
       "                                   comp.link comp.compIndustry comp.compStage  \\\n",
       "0    https://www.liepin.com/company/9386110/               互联网            NaN   \n",
       "1    https://www.liepin.com/company/8086509/                制药         沪深A股上市   \n",
       "2     https://www.liepin.com/company/552933/             计算机软件            NaN   \n",
       "3    https://www.liepin.com/company/8010374/              IT服务          创业板上市   \n",
       "4    https://www.liepin.com/company/1552617/           电气机械/器材          融资未公开   \n",
       "..                                       ...               ...            ...   \n",
       "35   https://www.liepin.com/company/7956170/             计算机软件          融资未公开   \n",
       "36   https://www.liepin.com/company/8634915/             计算机软件            NaN   \n",
       "37  https://www.liepin.com/company/12666301/             计算机软件            NaN   \n",
       "38  https://www.liepin.com/company/13521485/               互联网            NaN   \n",
       "39   https://www.liepin.com/company/7892457/                游戏           战略投资   \n",
       "\n",
       "    job.requireWorkYears job.requireEduLevel  \n",
       "0                    NaN                 NaN  \n",
       "1                    NaN                 NaN  \n",
       "2                    NaN                 NaN  \n",
       "3                    NaN                 NaN  \n",
       "4                    NaN                 NaN  \n",
       "..                   ...                 ...  \n",
       "35                  3-5年                  本科  \n",
       "36                  3-5年                  本科  \n",
       "37                  1-3年                学历不限  \n",
       "38                  1-3年                  本科  \n",
       "39                  1-3年                  本科  \n",
       "\n",
       "[520 rows x 32 columns]"
      ]
     },
     "execution_count": 20,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "new_shuju"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 58,
   "id": "31f5eb04",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-06-24T10:31:44.070637Z",
     "start_time": "2023-06-24T10:31:44.041315Z"
    }
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>工作名称</th>\n",
       "      <th>工作要求</th>\n",
       "      <th>工作经验</th>\n",
       "      <th>薪资</th>\n",
       "      <th>工作地区</th>\n",
       "      <th>学历要求</th>\n",
       "      <th>是否应届</th>\n",
       "      <th>工作种类</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>公司id</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>公司类型</th>\n",
       "      <th>公司主营</th>\n",
       "      <th>负责人</th>\n",
       "      <th>负责人职位</th>\n",
       "      <th>负责人ID</th>\n",
       "      <th>需要人数</th>\n",
       "      <th>职位信息</th>\n",
       "      <th>公司信息</th>\n",
       "      <th>数据来源</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>Web前端开发工程师</td>\n",
       "      <td>[学历不限, 前端开发]</td>\n",
       "      <td>NaN</td>\n",
       "      <td>12-16k·14薪</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>应届</td>\n",
       "      <td>6</td>\n",
       "      <td>多益网络有限公司</td>\n",
       "      <td>9386110.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>黄女士</td>\n",
       "      <td>HRBP</td>\n",
       "      <td>16fd5ec00a2bfe42455c0853f5145bf2</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/lptjob/51235411</td>\n",
       "      <td>https://www.liepin.com/company/9386110/</td>\n",
       "      <td>%7B%22jobId%22%3A%2251235411%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>[本科, 前端开发, jQuery, 界面开发, Vue, ElementUI, Node....</td>\n",
       "      <td>NaN</td>\n",
       "      <td>7-12k</td>\n",
       "      <td>广州</td>\n",
       "      <td>NaN</td>\n",
       "      <td>应届</td>\n",
       "      <td>6</td>\n",
       "      <td>凯普生物</td>\n",
       "      <td>8086509.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>沪深A股上市</td>\n",
       "      <td>制药</td>\n",
       "      <td>许女士</td>\n",
       "      <td>HR</td>\n",
       "      <td>2f42fd874540276863bd63b74d34940c</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/lptjob/42727089</td>\n",
       "      <td>https://www.liepin.com/company/8086509/</td>\n",
       "      <td>%7B%22jobId%22%3A%2242727089%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>前端开发（校招）</td>\n",
       "      <td>[本科, 前端开发, 框架开发, 框架设计, Bootstrap]</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8-12k·13薪</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>应届</td>\n",
       "      <td>6</td>\n",
       "      <td>广东亿迅科技有限公司</td>\n",
       "      <td>552933.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>NaN</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>唐女士</td>\n",
       "      <td></td>\n",
       "      <td>2199c8dab87ea363c6e6892e6c9d6d59</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/lptjob/52128303</td>\n",
       "      <td>https://www.liepin.com/company/552933/</td>\n",
       "      <td>%7B%22jobId%22%3A%2252128303%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>前端开发工程师(J12153)</td>\n",
       "      <td>[本科, 前端开发, 架构开发, 架构设计, Bootstrap, 模块开发]</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8-16k</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>应届</td>\n",
       "      <td>6</td>\n",
       "      <td>高新兴科技集团股份有限公司</td>\n",
       "      <td>8010374.0</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>创业板上市</td>\n",
       "      <td>IT服务</td>\n",
       "      <td>梁女士</td>\n",
       "      <td>COE负责人</td>\n",
       "      <td>1f7e62b2efae45bcb82117b42621f4e0</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/lptjob/52549581</td>\n",
       "      <td>https://www.liepin.com/company/8010374/</td>\n",
       "      <td>%7B%22jobId%22%3A%2252549581%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>[本科, 通信领域, 界面开发, 商业信息化, 后端开发, Vue, 系统开发, 框架设计,...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>10-25k</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>NaN</td>\n",
       "      <td>应届</td>\n",
       "      <td>6</td>\n",
       "      <td>广州三川控制系统工程设备有限公司</td>\n",
       "      <td>1552617.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>电气机械/器材</td>\n",
       "      <td>王女士</td>\n",
       "      <td>行管部总监</td>\n",
       "      <td>93ce1ae62a2ab0e5d1059d336c2cc2a7</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/lptjob/47628285</td>\n",
       "      <td>https://www.liepin.com/company/1552617/</td>\n",
       "      <td>%7B%22jobId%22%3A%2247628285%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>[javascript, 前端开发, css3, html, ajax, xml]</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-10k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "      <td>北京首工科技开发有限公司</td>\n",
       "      <td>8856650.0</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>检测/认证</td>\n",
       "      <td>林先生</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>775fc6c60de91ced483df9caec0e9427</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/job/1936994451.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8856650/</td>\n",
       "      <td>%7B%22jobId%22%3A%2236994451%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>web前端开发维护工程师</td>\n",
       "      <td>[框架设计, 架构设计, 界面开发, Unix, 电商领域, Android, Webpack]</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>6-10k</td>\n",
       "      <td>广州-增城区</td>\n",
       "      <td>大专</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "      <td>广州穹之粟智能科技有限公司</td>\n",
       "      <td>12989991.0</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>NaN</td>\n",
       "      <td>专业技术服务</td>\n",
       "      <td>钟先生</td>\n",
       "      <td>董事长</td>\n",
       "      <td>c3eaa5e601847b9559afcd5d8b60bd42</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/job/1945953121.shtml</td>\n",
       "      <td>https://www.liepin.com/company/12989991/</td>\n",
       "      <td>%7B%22jobId%22%3A%2245953121%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>前端开发专家</td>\n",
       "      <td>[前端开发]</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>薪资面议</td>\n",
       "      <td>广州</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "      <td>广州宸境科技有限公司</td>\n",
       "      <td>10142141.0</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>A轮</td>\n",
       "      <td>人工智能</td>\n",
       "      <td>胡先生</td>\n",
       "      <td>经理</td>\n",
       "      <td>50760506ba36d95f2295c122c9437964</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/job/1926151723.shtml</td>\n",
       "      <td>https://www.liepin.com/company/10142141/</td>\n",
       "      <td>%7B%22jobId%22%3A%2226151723%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>[前端开发, vue, webpack, windows, 小程序, javascript]</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>大专</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "      <td>聚变方成科技</td>\n",
       "      <td>12870175.0</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>天使轮</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>彭先生</td>\n",
       "      <td>CEO,联合创始人</td>\n",
       "      <td>c9335071eb5f495c6f4645e9807dfad9</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/job/1942782719.shtml</td>\n",
       "      <td>https://www.liepin.com/company/12870175/</td>\n",
       "      <td>%7B%22jobId%22%3A%2242782719%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>[javascript, css, 前端开发, react, vue, angular, j...</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-20k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>本科</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "      <td>新超硕科技(北京)有限公司</td>\n",
       "      <td>8586384.0</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>NaN</td>\n",
       "      <td>电气机械/器材</td>\n",
       "      <td>陈女士</td>\n",
       "      <td>人力经理</td>\n",
       "      <td>fd51e978b9f2b691c1801803be6280d2</td>\n",
       "      <td>2</td>\n",
       "      <td>https://www.liepin.com/job/1940615695.shtml</td>\n",
       "      <td>https://www.liepin.com/company/8586384/</td>\n",
       "      <td>%7B%22jobId%22%3A%2240615695%22%2C%22jobKind%2...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>160 rows × 20 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "               工作名称                                               工作要求   工作经验  \\\n",
       "0        Web前端开发工程师                                       [学历不限, 前端开发]    NaN   \n",
       "1           前端开发工程师  [本科, 前端开发, jQuery, 界面开发, Vue, ElementUI, Node....    NaN   \n",
       "2          前端开发（校招）                  [本科, 前端开发, 框架开发, 框架设计, Bootstrap]    NaN   \n",
       "3   前端开发工程师(J12153)            [本科, 前端开发, 架构开发, 架构设计, Bootstrap, 模块开发]    NaN   \n",
       "4              前端开发  [本科, 通信领域, 界面开发, 商业信息化, 后端开发, Vue, 系统开发, 框架设计,...    NaN   \n",
       "..              ...                                                ...    ...   \n",
       "35          前端开发工程师          [javascript, 前端开发, css3, html, ajax, xml]   1-3年   \n",
       "36     web前端开发维护工程师   [框架设计, 架构设计, 界面开发, Unix, 电商领域, Android, Webpack]  5-10年   \n",
       "37           前端开发专家                                             [前端开发]  5-10年   \n",
       "38          前端开发工程师     [前端开发, vue, webpack, windows, 小程序, javascript]   3-5年   \n",
       "39          前端开发工程师  [javascript, css, 前端开发, react, vue, angular, j...   1-3年   \n",
       "\n",
       "            薪资    工作地区 学历要求 是否应届 工作种类              公司名称        公司id  \\\n",
       "0   12-16k·14薪  广州-黄埔区  NaN   应届    6          多益网络有限公司   9386110.0   \n",
       "1        7-12k      广州  NaN   应届    6              凯普生物   8086509.0   \n",
       "2    8-12k·13薪  广州-天河区  NaN   应届    6        广东亿迅科技有限公司    552933.0   \n",
       "3        8-16k  广州-黄埔区  NaN   应届    6     高新兴科技集团股份有限公司   8010374.0   \n",
       "4       10-25k  广州-黄埔区  NaN   应届    6  广州三川控制系统工程设备有限公司   1552617.0   \n",
       "..         ...     ...  ...  ...  ...               ...         ...   \n",
       "35       8-10k  广州-番禺区   本科  NaN    2      北京首工科技开发有限公司   8856650.0   \n",
       "36       6-10k  广州-增城区   大专  NaN    2     广州穹之粟智能科技有限公司  12989991.0   \n",
       "37        薪资面议      广州   本科  NaN    2        广州宸境科技有限公司  10142141.0   \n",
       "38      10-15k      广州   大专  NaN    2            聚变方成科技  12870175.0   \n",
       "39      15-20k  广州-天河区   本科  NaN    2     新超硕科技(北京)有限公司   8586384.0   \n",
       "\n",
       "          公司规模    公司类型     公司主营  负责人      负责人职位  \\\n",
       "0   2000-5000人     NaN      互联网  黄女士       HRBP   \n",
       "1   2000-5000人  沪深A股上市       制药  许女士         HR   \n",
       "2   2000-5000人     NaN    计算机软件  唐女士              \n",
       "3   2000-5000人   创业板上市     IT服务  梁女士     COE负责人   \n",
       "4       50-99人   融资未公开  电气机械/器材  王女士      行管部总监   \n",
       "..         ...     ...      ...  ...        ...   \n",
       "35       1-49人   融资未公开    检测/认证  林先生       产品经理   \n",
       "36       1-49人     NaN   专业技术服务  钟先生        董事长   \n",
       "37      50-99人      A轮     人工智能  胡先生         经理   \n",
       "38       1-49人     天使轮    计算机软件  彭先生  CEO,联合创始人   \n",
       "39    500-999人     NaN  电气机械/器材  陈女士       人力经理   \n",
       "\n",
       "                               负责人ID 需要人数  \\\n",
       "0   16fd5ec00a2bfe42455c0853f5145bf2    2   \n",
       "1   2f42fd874540276863bd63b74d34940c    2   \n",
       "2   2199c8dab87ea363c6e6892e6c9d6d59    2   \n",
       "3   1f7e62b2efae45bcb82117b42621f4e0    2   \n",
       "4   93ce1ae62a2ab0e5d1059d336c2cc2a7    2   \n",
       "..                               ...  ...   \n",
       "35  775fc6c60de91ced483df9caec0e9427    2   \n",
       "36  c3eaa5e601847b9559afcd5d8b60bd42    2   \n",
       "37  50760506ba36d95f2295c122c9437964    2   \n",
       "38  c9335071eb5f495c6f4645e9807dfad9    2   \n",
       "39  fd51e978b9f2b691c1801803be6280d2    2   \n",
       "\n",
       "                                           职位信息  \\\n",
       "0        https://www.liepin.com/lptjob/51235411   \n",
       "1        https://www.liepin.com/lptjob/42727089   \n",
       "2        https://www.liepin.com/lptjob/52128303   \n",
       "3        https://www.liepin.com/lptjob/52549581   \n",
       "4        https://www.liepin.com/lptjob/47628285   \n",
       "..                                          ...   \n",
       "35  https://www.liepin.com/job/1936994451.shtml   \n",
       "36  https://www.liepin.com/job/1945953121.shtml   \n",
       "37  https://www.liepin.com/job/1926151723.shtml   \n",
       "38  https://www.liepin.com/job/1942782719.shtml   \n",
       "39  https://www.liepin.com/job/1940615695.shtml   \n",
       "\n",
       "                                        公司信息  \\\n",
       "0    https://www.liepin.com/company/9386110/   \n",
       "1    https://www.liepin.com/company/8086509/   \n",
       "2     https://www.liepin.com/company/552933/   \n",
       "3    https://www.liepin.com/company/8010374/   \n",
       "4    https://www.liepin.com/company/1552617/   \n",
       "..                                       ...   \n",
       "35   https://www.liepin.com/company/8856650/   \n",
       "36  https://www.liepin.com/company/12989991/   \n",
       "37  https://www.liepin.com/company/10142141/   \n",
       "38  https://www.liepin.com/company/12870175/   \n",
       "39   https://www.liepin.com/company/8586384/   \n",
       "\n",
       "                                                 数据来源  \n",
       "0   %7B%22jobId%22%3A%2251235411%22%2C%22jobKind%2...  \n",
       "1   %7B%22jobId%22%3A%2242727089%22%2C%22jobKind%2...  \n",
       "2   %7B%22jobId%22%3A%2252128303%22%2C%22jobKind%2...  \n",
       "3   %7B%22jobId%22%3A%2252549581%22%2C%22jobKind%2...  \n",
       "4   %7B%22jobId%22%3A%2247628285%22%2C%22jobKind%2...  \n",
       "..                                                ...  \n",
       "35  %7B%22jobId%22%3A%2236994451%22%2C%22jobKind%2...  \n",
       "36  %7B%22jobId%22%3A%2245953121%22%2C%22jobKind%2...  \n",
       "37  %7B%22jobId%22%3A%2226151723%22%2C%22jobKind%2...  \n",
       "38  %7B%22jobId%22%3A%2242782719%22%2C%22jobKind%2...  \n",
       "39  %7B%22jobId%22%3A%2240615695%22%2C%22jobKind%2...  \n",
       "\n",
       "[160 rows x 20 columns]"
      ]
     },
     "execution_count": 58,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Map each flattened API field (key) to the Chinese header used in the exported\n",
    "# sheet (value). Keeping field and header side by side in one dict means a header\n",
    "# can no longer drift out of position, which two parallel 20-item lists allow.\n",
    "# Dict insertion order defines the column order of the result.\n",
    "COLUMN_LABELS = {\n",
    "    'job.title': '工作名称',\n",
    "    'job.labels': '工作要求',\n",
    "    'job.requireWorkYears': '工作经验',\n",
    "    'job.salary': '薪资',\n",
    "    'job.dq': '工作地区',\n",
    "    'job.requireEduLevel': '学历要求',\n",
    "    'job.campusJobKind': '是否应届',\n",
    "    'job.jobKind': '工作种类',\n",
    "    'comp.compName': '公司名称',\n",
    "    'comp.compId': '公司id',\n",
    "    'comp.compScale': '公司规模',\n",
    "    'comp.compStage': '公司类型',\n",
    "    'comp.compIndustry': '公司主营',\n",
    "    'recruiter.recruiterName': '负责人',\n",
    "    'recruiter.recruiterTitle': '负责人职位',\n",
    "    'recruiter.recruiterId': '负责人ID',\n",
    "    # NOTE(review): this header reads 'headcount needed', but the field name looks\n",
    "    # like a recruiter IM user type and the value is 2 in every displayed row;\n",
    "    # confirm the intended meaning before relying on this column.\n",
    "    'recruiter.imUserType': '需要人数',\n",
    "    'job.link': '职位信息',\n",
    "    'comp.link': '公司信息',\n",
    "    'dataInfo': '数据来源',\n",
    "}\n",
    "\n",
    "# Select the mapped fields in mapping order, then relabel them. rename() returns a\n",
    "# new frame, so new_df keeps its original column names. A field missing from new_df\n",
    "# still raises KeyError at the selection step.\n",
    "exceldata = new_df[list(COLUMN_LABELS)].rename(columns=COLUMN_LABELS)\n",
    "exceldata"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "id": "58156c53",
   "metadata": {
    "ExecuteTime": {
     "end_time": "2023-06-24T10:26:35.545574Z",
     "start_time": "2023-06-24T10:26:34.590884Z"
    }
   },
   "outputs": [],
   "source": [
    "# Write the relabelled job table to an Excel workbook (path is relative to the\n",
    "# current working directory).\n",
    "# pandas is already imported as pd in the notebook's first cell, and exceldata is\n",
    "# already a DataFrame, so neither a second import nor a pd.DataFrame() re-wrap is needed.\n",
    "OUTPUT_XLSX = '前端开发行业数据.xlsx'\n",
    "daochu = exceldata  # 'daochu' (export) is kept so the name stays defined as before\n",
    "daochu.to_excel(OUTPUT_XLSX, index=False)  # index=False: do not write the row index"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e7d3609a",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.4"
  },
  "varInspector": {
   "cols": {
    "lenName": 16,
    "lenType": 16,
    "lenVar": 40
   },
   "kernels_config": {
    "python": {
     "delete_cmd_postfix": "",
     "delete_cmd_prefix": "del ",
     "library": "var_list.py",
     "varRefreshCmd": "print(var_dic_list())"
    },
    "r": {
     "delete_cmd_postfix": ") ",
     "delete_cmd_prefix": "rm(",
     "library": "var_list.r",
     "varRefreshCmd": "cat(var_dic_list()) "
    }
   },
   "types_to_exclude": [
    "module",
    "function",
    "builtin_function_or_method",
    "instance",
    "_Feature"
   ],
   "window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
